import wav2clip
import librosa
# Demo script: embed a single audio clip with Wav2CLIP and report the shape
# of the resulting embedding array.

# Clip to embed; the path is relative to the current working directory.
audio_path = "./data/trainset/0/0afa3112-057d-4edc-97dd-71655cfc745b.wav"

# sr=None asks librosa to keep the file's native sampling rate rather than
# resampling to its default rate. The call returns (samples, rate).
# NOTE(review): sample_rate is not used below -- confirm that the clip's
# native rate is what the Wav2CLIP model expects.
_loaded = librosa.load(audio_path, sr=None)
audio = _loaded[0]
sample_rate = _loaded[1]

# Build the model with the library's default settings, then run the clip
# through it.
model = wav2clip.get_model()
embeddings = wav2clip.embed_audio(
    audio,
    model,
)

# Print only the shape as a quick sanity check of the output.
print(embeddings.shape)